All
沿指定轴计算张量的逻辑与 (Logical AND)。如果轴上的所有元素都为真(非零),则输出为1.0,否则为0.0。
\[Y_i = \prod_{x \in S_i} B(x)\]
其中 \(S_i\) 是输入张量中用于计算输出 \(Y_i\) 的切片, \(B(x)\) 是一个辅助函数:
\[\begin{split}B(x)=\begin{cases} 1, & \text{if } x \neq 0 \\ 0, & \text{if } x = 0 \end{cases}\end{split}\]
- 输入:
outer_size - 规约轴之前的所有维度大小的乘积。
inner_size - 规约轴之后的所有维度大小的乘积。
axis_size - 规约轴本身的大小。
src_data - 输入数据地址。
core_mask - 核掩码。
- 输出:
dst_data - 输出数据地址。
- 支持平台:
FT78NEMT7004
备注
FT78NE 支持int8, int16, int32, fp32, fp64, cplx64, cplx128
MT7004 支持fp16, fp32, int16, int32, cplx64
共享存储版本:
-
void i8_reduceall_s(int outer_size, int inner_size, int axis_size, int8_t *src_data, int8_t *dst_data, int core_mask)
-
void i16_reduceall_s(int outer_size, int inner_size, int axis_size, int16_t *src_data, int16_t *dst_data, int core_mask)
-
void i32_reduceall_s(int outer_size, int inner_size, int axis_size, int *src_data, int *dst_data, int core_mask)
-
void hp_reduceall_s(int outer_size, int inner_size, int axis_size, half *src_data, half *dst_data, int core_mask)
-
void fp_reduceall_s(int outer_size, int inner_size, int axis_size, float *src_data, float *dst_data, int core_mask)
-
void dp_reduceall_s(int outer_size, int inner_size, int axis_size, double *src_data, double *dst_data, int core_mask)
-
void c64_reduceall_s(int outer_size, int inner_size, int axis_size, float *src_data, float *dst_data, int core_mask)
-
void c128_reduceall_s(int outer_size, int inner_size, int axis_size, double *src_data, double *dst_data, int core_mask)
C调用示例:
1//FT78NE示例
2#include <stdio.h>
3#include <all.h>
4int main(int argc, char* argv[]) {
5 float *src_data = (float *)0xA0000000; //input在DDR空间
6 float *dst_data = (float *)0xB0000000; //output
7 int outer_size = 2;
8 int inner_size = 4;
9 int axis_size = 3;
10 int core_mask = 0xff;
11 fp_reduceall_s(outer_size, inner_size, axis_size, src_data, dst_data, core_mask);
12 return 0;
13}
私有存储版本:
-
void i8_reduceall_p(int outer_size, int inner_size, int axis_size, int8_t *src_data, int8_t *dst_data)
-
void i16_reduceall_p(int outer_size, int inner_size, int axis_size, int16_t *src_data, int16_t *dst_data)
-
void i32_reduceall_p(int outer_size, int inner_size, int axis_size, int *src_data, int *dst_data)
-
void hp_reduceall_p(int outer_size, int inner_size, int axis_size, half *src_data, half *dst_data)
-
void fp_reduceall_p(int outer_size, int inner_size, int axis_size, float *src_data, float *dst_data)
-
void dp_reduceall_p(int outer_size, int inner_size, int axis_size, double *src_data, double *dst_data)
-
void c64_reduceall_p(int outer_size, int inner_size, int axis_size, float *src_data, float *dst_data)
-
void c128_reduceall_p(int outer_size, int inner_size, int axis_size, double *src_data, double *dst_data)
C调用示例:
1//FT78NE示例
2#include <stdio.h>
3#include <all.h>
4int main(int argc, char* argv[]) {
5 float *src_data = (float *)0x10000000; //input在DDR空间
6 float *dst_data = (float *)0x10001000; //output
7 int outer_size = 2;
8 int inner_size = 4;
9 int axis_size = 3;
10 fp_reduceall_p(outer_size, inner_size, axis_size, src_data, dst_data);
11 return 0;
12}